{
  "dataset_reader": {
    "class_name": "odqa_reader",
    "data_path": "",
    "save_path": "/data/odqa/userfile.db",
    "dataset_format": "wiki"
  },
  "dataset_iterator": {
    "class_name": "sqlite_iterator",
    "shuffle": false,
    "load_path": "/data/odqa/userfile.db"
  },
  "chainer": {
    "in": [
      "docs"
    ],
    "in_y": [
      "doc_ids",
      "doc_nums"
    ],
    "out": [
      "tfidf_doc_ids"
    ],
    "pipe": [
      {
        "class_name": "hashing_tfidf_vectorizer",
        "id": "vectorizer",
        "fit_on": [
          "docs",
          "doc_ids",
          "doc_nums"
        ],
        "save_path": "/data/odqa/userfile_tfidf_matrix.npz",
        "load_path": "/data/odqa/userfile_tfidf_matrix.npz",
        "tokenizer": {
          "class_name": "stream_spacy_tokenizer",
          "lemmas": true,
          "lowercase": true,
          "filter_stopwords": true,
          "ngram_range": [
            1,
            2
          ]
        }
      },
      {
        "class_name": "tfidf_ranker",
        "top_n": 12,
        "in": [
          "docs"
        ],
        "out": [
          "tfidf_doc_ids",
          "tfidf_doc_scores"
        ],
        "vectorizer": "#vectorizer"
      }
    ]
  },
  "train": {
    "batch_size": 10000,
    "evaluation_targets": [],
    "class_name": "fit_trainer"
  },
  "metadata": {
    "variables": {
      "ROOT_PATH": "~/.deeppavlov",
      "DOWNLOADS_PATH": "{ROOT_PATH}/downloads",
      "MODELS_PATH": "{ROOT_PATH}/models"
    },
    "download": [
      {
        "url": "http://files.deeppavlov.ai/datasets/wikipedia/enwiki.tar.gz",
        "subdir": "{DOWNLOADS_PATH}"
      },
      {
        "url": "http://files.deeppavlov.ai/deeppavlov_data/en_odqa.tar.gz",
        "subdir": "{MODELS_PATH}"
      }
    ]
  }
}